
*Goal: define aggregated occupation classifications
	*blue collar: over 50% male and under 40% college degree in 2000:
	//construction, installation, transport, farming, protection, production, building maintenance
	*pink collar: over 50% female and under 40% college degree in 2000: [excluding OAS]
	//health support, personal care, food prep, sales
	*white collar male: over 50% male and over 40% college degree in 2000
	//architecture, computer occs, mgmt, legal, physical sciences, arts and design
	*white collar female: over 50% female and over 40% college degree in 2000
	//health, education, community service, business

	// Load Data
* Read only the variables needed, and only the year-2000 observations.
use age empstat classwkr year occ2010 sex educd perwt ///
	if year == 2000 ///
	using "$dir/data/data_public/census_1970_2000.dta", clear

	* Sample restriction: ages 15 through 64 (missing ages are dropped too,
	* because missing compares as larger than any number).
	drop if age < 15 | age >= 65

	* Keep employed workers (empstat == 1) who are not self-employed
	* (classwkr == 1 is the self-employed code being excluded).
	keep if empstat == 1 & classwkr != 1

	* Every remaining observation is employed; emp is summed later to get
	* weighted employment counts.
	gen emp = 1

	* Indicator for women (sex == 2).
	gen female = (sex == 2)

	* Education indicators, left missing when educd is missing.
	* NOTE(review): thresholds 101 and 64 are presumably the IPUMS EDUCD
	* cut-offs for a bachelor's degree and for some college - confirm
	* against the codebook.
	gen college      = cond(educd == ., ., educd >= 101)
	gen some_college = cond(educd == ., ., educd >= 64)
	
	
	* Map detailed occ2010 codes to major occupation groups.
	*
	* Most ranges are half-open [lower, next round boundary). Four groups end
	* on a value that is itself an occupation code in the IPUMS OCC2010 scheme
	* (430 Managers nec, 3540 Healthcare practitioners nec, 6940 Extraction
	* workers nec, 9750 Material moving workers nec), so their upper bound
	* must be inclusive (<=); a strict < would leave those codes unclassified.
	*
	* Codes outside every range (and missing occ2010) keep major_occ == "".
	gen str15 major_occ = ""

	* Professional / managerial groups
	replace major_occ = "Management"      if (occ2010 >= 10   & occ2010 <= 430)
	replace major_occ = "Business"        if (occ2010 >= 500  & occ2010 < 1000)
	replace major_occ = "Computer/Math"   if (occ2010 >= 1000 & occ2010 < 1300)
	replace major_occ = "Engineering"     if (occ2010 >= 1300 & occ2010 < 1600)
	replace major_occ = "Science"         if (occ2010 >= 1600 & occ2010 < 2000)
	replace major_occ = "Social Services" if (occ2010 >= 2000 & occ2010 < 2100)
	replace major_occ = "Legal"           if (occ2010 >= 2100 & occ2010 < 2200)
	replace major_occ = "Education"       if (occ2010 >= 2200 & occ2010 < 2600)
	replace major_occ = "Arts"            if (occ2010 >= 2600 & occ2010 < 3000)
	replace major_occ = "Health"          if (occ2010 >= 3000 & occ2010 <= 3540)

	* Service, sales and office groups
	replace major_occ = "Health Support"  if (occ2010 >= 3600 & occ2010 < 3700)
	replace major_occ = "Protection"      if (occ2010 >= 3700 & occ2010 < 4000)
	replace major_occ = "Food Prep"       if (occ2010 >= 4000 & occ2010 < 4200)
	replace major_occ = "Maintenance"     if (occ2010 >= 4200 & occ2010 < 4300)
	replace major_occ = "Personal Care"   if (occ2010 >= 4300 & occ2010 < 4700)
	replace major_occ = "Sales"           if (occ2010 >= 4700 & occ2010 < 5000)
	replace major_occ = "OAS"             if (occ2010 >= 5000 & occ2010 < 6000)

	* Manual / production groups
	replace major_occ = "Farming"         if (occ2010 >= 6000 & occ2010 < 6200)
	replace major_occ = "Construction"    if (occ2010 >= 6200 & occ2010 <= 6940)
	replace major_occ = "Installation"    if (occ2010 >= 7000 & occ2010 < 7700)
	replace major_occ = "Production"      if (occ2010 >= 7700 & occ2010 < 9000)
	replace major_occ = "Transport"       if (occ2010 >= 9000 & occ2010 <= 9750)
	
* Drop observations with missing education or sex so that every statistic
* below is computed over the same set of workers.
drop if educd == . | sex == .

	* Collapse to one row per major occupation group, weighting by perwt:
	*   female, college, some_college -> weighted means (shares)
	*   emp                           -> weighted sum (employment count)
	collapse (mean) female college some_college (sum) emp [pw = perwt], by(major_occ)

	* Remove the row for observations that were not assigned to any group.
	drop if major_occ == ""

	* Forward slashes work on every platform Stata runs on (backslashes are
	* Windows-only) and match the path style used when loading the data.
	save "$dir/data/interim/occs_female_college.dta", replace
	
